package com.minglead.crawler.constant;

import java.io.File;

/**
 * Static configuration constants for the crawler and NLP model-analysis jobs:
 * result limits, working directories, model names, crawler output ("ret")
 * directories, archive directories and the URLs that are crawled.
 *
 * <p>All paths are derived from {@link #rootPath}, which is an absolute
 * Unix-style path. Constant names mix lowerCamelCase and UPPER_SNAKE_CASE;
 * they are kept exactly as they are so existing callers keep compiling.
 *
 * <p>This class only holds constants and cannot be instantiated.
 */
public final class YqModelAnalysisConstant {

    /** Not instantiable: this class is a pure constants holder. */
    private YqModelAnalysisConstant() {
    }

    /** Number of article-classification results to keep. */
    public static final int thutctTopN = 1;
    /** Number of keyword-analysis results to keep. */
    public static final int keywordTopN = 5;
    /** Minimum number of Chinese characters in a single keyword. */
    public static final int minWordNum = 2;

    /** Root path under which every other directory in this class lives. */
    public static final String rootPath = "/opt/software/Resources/price_data";
    /** Working directory of the analysis models. */
    public static final String modelAnalysisJobPath = rootPath + File.separator + "nlp";
    /** Working directory of the crawlers. */
    public static final String crawlerJobPath = rootPath + File.separator + "crawler";
    /** Directory from which model analysis reads article body files. */
    public static final String modelAnalysisContentPath = modelAnalysisJobPath + File.separator + "input";

    // ---- Model names ----
    /** Industry (domain) analysis model. */
    public static final String domainModelName = "nlp_domain_classification_chinese";
    /** Sentiment analysis model. */
    public static final String sentimentModelName = "nlp_structbert_sentiment-classification_chinese-tiny";
    /** Category analysis model. */
    public static final String thuctcModelName = "THUCTC2";
    /** Keyword analysis model. */
    public static final String keywordModelName = "TextRank4ZH-master";

    // ---- Crawler working directories ----
    /** Directory containing the crawler code. */
    public static final String crawlerCodePath = rootPath + File.separator + "jiajian_scrapy";
    /** Toutiao crawler working directory. */
    public static final String toutiaoBasePath = crawlerCodePath + File.separator + "toutiao_news";
    /** Weibo crawler working directory. */
    public static final String weiboBasePath = crawlerCodePath + File.separator + "weibo-search";
    /** Xiaohongshu (RedBook) crawler working directory. */
    public static final String redBookBasePath = crawlerCodePath + File.separator + "xiaohongshu";
    /** China News Network crawler working directory. */
    public static final String chinaNewsNetworkBasePath = crawlerCodePath + File.separator + "chinanews";
    /** Xinhuanet crawler working directory. */
    public static final String xinhuaBasePath = crawlerCodePath + File.separator + "xinhuanet";
    /** Tencent News crawler working directory. */
    public static final String tencentBasePath = crawlerCodePath + File.separator + "tencent_news";
    /** Sogou WeChat crawler working directory. */
    public static final String sougouWechatBasePath = crawlerCodePath + File.separator + "sougou-wechat";
    /** Sina Finance crawler working directory. */
    public static final String financeSinaBasePath = crawlerCodePath + File.separator + "finance-sina";
    /** Chicago Board of Trade (CBOT) crawler working directory. */
    public static final String cbotBasePath = crawlerCodePath + File.separator + "cbot";
    /** Shanghai International Energy Exchange (INE) crawler working directory. */
    public static final String ineDailyBasePath = crawlerCodePath + File.separator + "ine-daily";
    /** Guangdong Bureau of Statistics, main national-economy indicators crawler working directory. */
    public static final String gdNationalBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdNational";
    /** Guangdong Bureau of Statistics, quarterly GDP crawler working directory. */
    public static final String gdQuarterBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdQuarter";
    /** Guangdong Bureau of Statistics, vegetable and melon/fruit production crawler working directory. */
    public static final String gdSituationBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdSituation";
    /** Guangdong Bureau of Statistics, industrial added value crawler working directory. */
    public static final String gdAddBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdAdd";
    /** Guangdong Bureau of Statistics, output of major products crawler working directory. */
    public static final String gdProductionBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdProduction";
    /** Guangdong Bureau of Statistics, main industrial economic indicators crawler working directory. */
    public static final String gdIndustryBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdIndustry";
    /** Guangdong Bureau of Statistics, total retail sales of consumer goods crawler working directory. */
    public static final String gdTotalBasePath = crawlerCodePath + File.separator + "stats-gd-gov-gdTotal";

    // ---- "ret" file directory of each source (the "ret" sub-directory of its working directory) ----
    public static final String TOUTIAO_RET_PATH = toutiaoBasePath + File.separator + "ret";
    public static final String WEIBO_RET_PATH = weiboBasePath + File.separator + "ret";
    public static final String XIAOHONGSHU_RET_PATH = redBookBasePath + File.separator + "ret";
    public static final String CHINANEWSNETWORK_RET_PATH = chinaNewsNetworkBasePath + File.separator + "ret";
    public static final String XINHUA_RET_PATH = xinhuaBasePath + File.separator + "ret";
    public static final String TENCENT_RET_PATH = tencentBasePath + File.separator + "ret";
    public static final String SOUGOUWECHAT_RET_PATH = sougouWechatBasePath + File.separator + "ret";
    public static final String FINANCESINA_RET_PATH = financeSinaBasePath + File.separator + "ret";
    public static final String CBOT_RET_PATH = cbotBasePath + File.separator + "ret";
    public static final String INEDAILY_RET_PATH = ineDailyBasePath + File.separator + "ret";
    public static final String GD_NATIONAL_RET_PATH = gdNationalBasePath + File.separator + "ret";
    public static final String GD_QUARTER_RET_PATH = gdQuarterBasePath + File.separator + "ret";
    public static final String GD_SITUATION_RET_PATH = gdSituationBasePath + File.separator + "ret";
    public static final String GD_ADD_RET_PATH = gdAddBasePath + File.separator + "ret";
    public static final String GD_PRODUCTION_RET_PATH = gdProductionBasePath + File.separator + "ret";
    public static final String GD_INDUSTRY_RET_PATH = gdIndustryBasePath + File.separator + "ret";
    public static final String GD_TOTAL_RET_PATH = gdTotalBasePath + File.separator + "ret";

    /** Conda environment directory. */
    public static final String CONDA_PATH = rootPath + File.separator + "conda_env";

    /**
     * Shell snippet used instead of {@code source /home/gosadmin/.bashrc;}:
     * it captures the output of {@code conda shell.bash hook} and, when that
     * command exits with status 0, {@code eval}s it.
     */
    public static final String SOURCE_PATH =
            "__conda_setup=\"$('conda' 'shell.bash' 'hook' 2> /dev/null)\"\n" +
            "if [ $? -eq 0 ]; then\n" +
            "    eval \"$__conda_setup\"\n" +
            "fi\n";

    /**
     * Parent directory of the archived Guangdong statistics files.
     * Built from literals only (hard-coded "/"), so unlike the
     * {@code File.separator}-based paths it is a compile-time constant;
     * kept that way on purpose so the value and its constant-ness do not change.
     */
    public static final String gdProvinceStatisticsDir = rootPath + "/crawler/dataFile/gdProvinceStatistics";

    // ---- Archive directories, one per Guangdong statistics data set ----
    public static final String gdNationalGuidangDir = gdProvinceStatisticsDir + File.separator + "gdNational";
    public static final String gdQuarterGuidangDir = gdProvinceStatisticsDir + File.separator + "gdQuarter";
    public static final String gdSituationGuidangDir = gdProvinceStatisticsDir + File.separator + "gdSituation";
    public static final String gdAddGuidangDir = gdProvinceStatisticsDir + File.separator + "gdAdd";
    public static final String gdProductionGuidangDir = gdProvinceStatisticsDir + File.separator + "gdProduction";
    public static final String gdIndustryGuidangDir = gdProvinceStatisticsDir + File.separator + "gdIndustry";
    public static final String gdTotalGuidangDir = gdProvinceStatisticsDir + File.separator + "gdTotal";

    // ---- URLs crawled by the crawlers ----
    public static final String FINANCESINA_ADDRESS = "https://finance.sina.com.cn/money/future/hf.html";
    public static final String CBOT_ADDRESS = "https://quote.stockstar.com/futures/cbot.html";
    public static final String INEDAILY_ADDRESS = "https://www.ine.cn/";
    public static final String GD_NATIONAL_ADDRESS = "http://stats.gd.gov.cn/gmjjzyzb/index.html";
    // The name is misspelled ("QUARTERL"); it is kept unchanged because callers reference it.
    public static final String GD_QUARTERL_ADDRESS = "http://stats.gd.gov.cn/jdgnsczz/index.html";
    public static final String GD_SITUATION_ADDRESS = "http://stats.gd.gov.cn/scggscqk/index.html";
    public static final String GD_ADD_ADDRESS = "http://stats.gd.gov.cn/gyzjz/index.html";
    // NOTE(review): this URL is identical to GD_ADD_ADDRESS, which looks like a
    // copy-paste slip. Confirm the correct page for the product-output data set.
    public static final String GD_PRODUCTION_ADDRESS = "http://stats.gd.gov.cn/gyzjz/index.html";
    public static final String GD_INDUSTRY_ADDRESS = "http://stats.gd.gov.cn/gyzyjjzb/index.html";
    public static final String GD_TOTAL_ADDRESS = "http://stats.gd.gov.cn/shxfplsze/index.html";

}
